\contentsline {section}{\numberline {1}Introduction}{4}
\contentsline {section}{\numberline {2}Log-Laplace review and MLE derivation}{6}
\contentsline {section}{\numberline {3}Asymmetric Exponential Power Distribution, Review and MLE derivation}{11}
\contentsline {section}{\numberline {4}CUDA programming review}{14}
\contentsline {subsection}{\numberline {4.1}CUDA threads architecture and control}{14}
\contentsline {subsection}{\numberline {4.2}GPU memory}{16}
\contentsline {section}{\numberline {5}Parallel Computing in CUDA}{19}
\contentsline {subsection}{\numberline {5.1}Motivation for Acceleration}{19}
\contentsline {subsection}{\numberline {5.2}Sequential Programming in C++}{20}
\contentsline {subsection}{\numberline {5.3}Parallel Programming in CUDA}{21}
\contentsline {subsection}{\numberline {5.4}Results}{22}
\contentsline {section}{\numberline {6}GPGPU Techniques and Results}{24}
\contentsline {subsection}{\numberline {6.1}Identifying the Bottleneck}{24}
\contentsline {subsection}{\numberline {6.2}General GPGPU techniques}{25}
\contentsline {subsection}{\numberline {6.3}Acceleration Techniques: Summing GPGPU threads}{27}
\contentsline {subsection}{\numberline {6.4}Acceleration Techniques: GPU Memory}{33}
\contentsline {subsection}{\numberline {6.5}Acceleration Techniques: OpenMP + CUDA}{36}
\contentsline {section}{\numberline {7}Acceleration Using Properties of Data}{39}
\contentsline {subsection}{\numberline {7.1}Lookup Table Implementation}{39}
